{i18n.t("bench.detail.title", { task: taskId })}

{i18n.t("bench.detail.notFound")}

{i18n.t("bench.detail.labels.agent")}: {task()?.agent ?? i18n.t("bench.detail.na")}

{i18n.t("bench.detail.labels.model")}: {task()?.model ?? i18n.t("bench.detail.na")}

{i18n.t("bench.detail.labels.task")}: {task()!.task.id}

{i18n.t("bench.detail.labels.repo")}: {task()!.task.source.repo}

{i18n.t("bench.detail.labels.from")}: {task()!.task.source.from.slice(0, 7)}

{i18n.t("bench.detail.labels.to")}: {task()!.task.source.to.slice(0, 7)}

0}>

{i18n.t("bench.detail.labels.prompt")}: {(p) => (

{i18n.t("bench.detail.labels.commit")}: {p.commit.slice(0, 7)}

{p.prompt}

)}

{i18n.t("bench.detail.labels.averageDuration")}: {task()?.averageDuration ? formatDuration(task()!.averageDuration!) : i18n.t("bench.detail.na")}

{i18n.t("bench.detail.labels.averageScore")}: {task()?.averageScore?.toFixed(3) ?? i18n.t("bench.detail.na")}

{i18n.t("bench.detail.labels.averageCost")}: {task()?.averageUsage?.cost ? `$${task()!.averageUsage!.cost.toFixed(4)}` : i18n.t("bench.detail.na")}

{i18n.t("bench.detail.labels.summary")}:

{task()!.summary}

0}>

{i18n.t("bench.detail.labels.runs")}: {(detail) => ( )} {(run, index) => ( {(detail) => ( )} )}

{i18n.t("bench.detail.table.run")}	{i18n.t("bench.detail.table.score")}	{i18n.t("bench.detail.table.cost")}	{i18n.t("bench.detail.table.duration")}	{detail.criterion} ({detail.weight})
{index() + 1}	{run.score.final.toFixed(3)} ({run.score.base.toFixed(3)} - {run.score.penalty.toFixed(3)})	{run.usage?.cost ? `$${run.usage.cost.toFixed(4)}` : i18n.t("bench.detail.na")}	{run.duration ? formatDuration(run.duration) : i18n.t("bench.detail.na")}	{(judge) => ( {judge.score === 1 ? "✓" : judge.score === 0 ? "✗" : judge.score} )}

{(run, index) => (

{i18n.t("bench.detail.run.title", { n: index() + 1 })}

{i18n.t("bench.detail.labels.score")}: {run.score.final.toFixed(3)} ({i18n.t("bench.detail.labels.base")}: {run.score.base.toFixed(3)} -{" "} {i18n.t("bench.detail.labels.penalty")}: {run.score.penalty.toFixed(3)})

{(detail) => (

{detail.criterion} ({i18n.t("bench.detail.labels.weight")}: {detail.weight}){" "} {(judge) => ( {judge.score === 1 ? "✓" : judge.score === 0 ? "✗" : judge.score} )}

0}> {(judge) => { const [expanded, setExpanded] = createSignal(false) return (

setExpanded(!expanded())} > {expanded() ? "▼" : "▶"} {judge.score === 1 ? "✓" : judge.score === 0 ? "✗" : judge.score} {" "} {judge.judge}

{judge.rationale}

) }}

)}

{(() => { const [jsonExpanded, setJsonExpanded] = createSignal(false) return (

{JSON.stringify(task(), null, 2)}

) })()}